# Launch src/sft.py on deepseek-ai/deepseek-llm-7b-base, writing results to
# models/deepseek-llm-7b-instruct2.
#
# Environment (set for this one command only):
#   CUDA_VISIBLE_DEVICES  exposes GPU indices 0 through 7 to the process.
#   HF_ENDPOINT           points Hugging Face Hub requests at hf-mirror.com.
#
# --dataset_name is a single comma-separated value naming three datasets.
# NOTE(review): --sampling and --check_steps are defined by src/sft.py, which
# is not visible here; confirm their meaning against that script before tuning.
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 \
HF_ENDPOINT=https://hf-mirror.com \
python src/sft.py \
  --model_name_or_path deepseek-ai/deepseek-llm-7b-base \
  --output_dir models/deepseek-llm-7b-instruct2 \
  --dataset_name llamafactory/alpaca_gpt4_zh,llamafactory/alpaca_gpt4_en,shibing624/sharegpt_gpt4 \
  --gradient_accumulation_steps 16 \
  --sampling 0.03 \
  --save_steps 50 \
  --eval_steps 10 \
  --check_steps 5